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extern "C" void 

sRGBColor( Color *pOut, Color *pln ) 
{ 

for ( int i = 0; i < 4; i++) 
{ 

float x = (*pln)[i]; 
if ( x < 0.03928f ) 

x = x/12.92f; 
else 

x = powf(((x + 0.055f)/1.055f), 2.4f); 
(*pOut)[i] = x; 



FIG. 3 



extern "C" void 

LinearTosRGBColor( Color *pOut, Color *pln ) 
{ 

// coarse approximation: weighted arithmetic mean between 
// x A 0.5 and x A 0.375 approximates x A (1/2.4) 
for ( int i = 0; i < 4; i++) 

{ 

float x = (*pln)[i]; 

float sqrtx = sqrtf(x); 

float sqrt3x = sqrtf(sqrtf(sqrtx)); 

float pow124 = 0.38f*sqrtx+0.62rsqrtx/sqrt3x; 

if ( x < 0.00304f ) 

x = 12.92f*x; 

else 

x = 1.055f*pow124-0.055f; 
(*pOut)[i]=x; 

} 

} 
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extern "C" void 

LinearTosRGBColor( Color *pOut, Color *pln ) 
{ 

// finer approximation that avoids taking 3 successive 
// square roots: apply one round of N-R to guess cube 
// root of x*sqrt(sqrt(x)) 
for ( int i = 0; i < 4; i++) 
{ 

float x = (*pln)[i]; 

float sqrtx = sqrtf(x); 

float sqrt2x = sqrtf(sqrtx); 

float appx = 0.78f*sqrtx+0.22f*sqrt2x; 

float num = x*sqrt2x; 

float cuberoot = (2*appx+(x*sqrt2x)/(appx*appx))/3.0f - 0.00025f; 
if(x<0.00304f ) 

x= 12.92f *x; 

else 

x = 1 .055f*cuberoot-0.055f; 
(*pOut)[i]=x; 

} 
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const declspec(align(16)) m128 Const039 = _mm_set1_ps( 

0.03928f ); 

const declspec(align(16)) m128 Constlnv1292 = _mm_set1 _ps( 

1.0f/12.92f ); 

const declspec(align(16)) m128 Const055 = _mm_set1_ps( 0.055f 

); 

const declspec(align(16)) m128 Constlnv1055 = _mm_set1_ps( 

1.0f/1.055f ); 

const declspec(align(16)) m128 Const1285 = _mm_set1 _ps( 

1.285f); 

const declspec(align(16)) m128 Const0285 = _mm_set1_ps( 

0.285f); 
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FIG. 6 



extern "C" void 

sRGBColor( Color *pOut, Color *pln ) 
{ 

// SIMD: compute BOTH answers and compose output using mask 

m128 ansBelowDelta = _mm_mul_ps( *( m128 *) pin, Constlnv1292 ); 

m128 x = _mm_mul_ps( Constlnv1055, _mm_add_ps( *( m128 *) pin, 

Const055 ) ); 

m128 sqrx = _mm_mul_ps( x, x ); 

m128 invsqrx = _mm_rcp_ps( sqrx ); 

m128 invsqrtx = _mm_rsqrt_ps( x ); 

m128 ansAboveDelta = _mm_div_ps( Const1285, 

_mm_mul_ps( invsqrx, _mm_add_ps( Const0285, invsqrtx ) ) ); 

m128 TruelfLTDelta = _mm_cmplt_ps( *( m128 *) pin, Const039 ); 

*( m128 *) pOut = _mm_or_ps( _mm_and_ps( TruelfLTDelta, ansBelowDelta 

). 

_mm_andnot_ps( TruelfLTDelta, ansAboveDelta ) ); 

} 
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FIG. 7 



const declspec(align(16)) m128 CONST00304 = jmm_set1_ps( 0.00304f ); 

const declspec(align(16)) m128 CONST1292 =_mm_set1_ps( 12.92f ); 

const declspec(align(16)) m128 CONST055 = _mm_set1_ps( 0.055f ); 

const _declspec(align(16)) m128 CONST1055 = _mm_set1_ps( 1 .055f ); 



const declspec(align(16)) m128 CONST078 = _mm_set1_ps( 0.78f ); 

const declspec(align(16)) m128 CONST1m078 = _mm_set1_ps( 1.0f-0.78f ); 



const declspec(align(16)) m128 CONST38 = _mm_set1_ps( 0.38f ); 

const declspec(align(16)) m128 CONST1m38 = J7im_set1_ps( 1.0f-0.38f ); 



extern "C rt void 

LinearTosRGBColor( Color *pOut, Color *pln ) 
{ 

m128 ansBelowDelta = _mm_mul_ps( *( m128 *) pin, CONST1292 ); 

m128 sqrtx = _mm_sqrt_ps( *( m128 *) pin ); 

m128 sqrt3x = _mm_sqrt_ps( _mm_sqrt_ps( sqrtx ) ); 

m128 pow124 = _mm_add_ps( _mm_mul jps{ CONST38, sqrtx ), 

_mm_divjDs( _mm_mul_ps( CONST1m38 t sqrtx ), sqrt3x ) ); 

m128 ansAboveDelta = _mm_sub_ps( _mm_mul_ps( CONST1055, pow124 ), CONST055 ); 

_m128 TruetfLTDelta = _mm_cmplt_ps( *(_m128 *) pin, CONST00304 ); 

*( m128 *) pOut = _mm_or_ps( _mm_and_ps( TruelfLTDelta, ansBelowDelta ), 

_mm_andnotjDs( TruelfLTDelta, ansAboveDelta ) ); 

} 
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_mm__set1 _ps( 0.00304f ); 
_mm_set1_ps( 12.92f ); 
mm_set1_ps( 0.055f ); 
mm_set1 _ps( 1.055f ); 
mm_set1 _ps( 1.0f/3.0f ); 
_mm_set1_ps( 0.00025f ); 

const declspec(align(16)) m128 Magic078 = _mm_set1 _ps( 0.78f ); 

const dec!spec(align(16)) rn128 Magic! m078 = _mm_set1_ps( 1 .0f-0.78f ); 

const declspec(align(16)) m128 Magic38 = _mm_set1_ps( 0.38f ); 

const declspec(align(1 6)) m128 Magid m38 = _mm_set1 _ps( 1 .0f-0.38f ); 

extern "C" void 

LinearTosRGBColor( Color *pOut, Color *pln ) 
{ 

m128 ansBelowDelta = _mm__mulj3s( *( m128 *) pin, Magid 292 ); 

m128 sqrtx = _mm_sqrt_ps( *( m128 *) pin ); 

m128 sqrt2x = _mm_sqrt_ps( sqrtx ); 

m128 appx = _mm_add_ps( _mm_mul_ps( Magic078, sqrtx ), 

_mm_mul_ps( Magid m078, sqrt2x ) ); 

m128 cuberoot = _mm_sub_ps( 

_mm_mul_ps( Magiclnv3, 
_mm_add_ps( _mm_add_ps( appx, appx ), 

_mm_div_ps( _mm_mul_ps( *( m128 *) pin, sqrt2x ), 

_mm_mul_ps( appx, appx ) 

) 

) 

), MagicFudge 

); 

m128 ansAboveDelta = _mm sub_ps( _mm_mul_ps( Magid 055, cuberoot ), Magic055 ); 

m128 TruelfLTDelta = _mm_cmplt_ps( *( m128 *) pin, Magic00304 ); 

*( m128 *) pOut = _mm_or_ps( _mm_and_ps( TruelfLTDelta, ansBelowDelta ), 

_mm_andnot_ps( TruelfLTDelta, ansAboveDelta ) ); 

} 
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const declspec(align(16)) m128 Magic00304 = 

const decispec(align(16)) m128 Magid 292 = _ 

const declspec(align(16)) m128 Magic055 =_ 

const declspec(align(16)) m128 Magid 055 = _ 

const declspec(align(16)) m128 Magiclnv3 = _ 

const declspec(align(16)) m128 MagicFudge = 
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